[1]:
from ckg.graphdb_builder import builder_utils
[2]:
# Location of the example mzTab file that the following cells parse.
# Relative path -- presumably resolved against the notebook's working directory; confirm.
example_file = "tmp/example_PXD022733.mzTab"
[4]:
# Parse the example mzTab file with the ckg builder_utils helper.
# The output of the following cell shows the result is a dict with the keys
# 'MTD', 'PRT' and 'PSM'.
data = builder_utils.parse_mztab_file(example_file)
[6]:
# Show the top-level keys of the parsed result to see which sections were read.
# NOTE(review): the key names look like mzTab line prefixes (metadata / protein /
# PSM sections) -- confirm against parse_mztab_file.
print(data.keys())
dict_keys(['MTD', 'PRT', 'PSM'])
[8]:
# Preview the first rows of the 'PRT' entry. The rendered table is very wide
# (1048 columns), so the display elides the middle columns.
# NOTE(review): presumably a pandas DataFrame, judging by the rendered output -- confirm.
data['PRT'].head()
[8]:
accession description taxid species database database_version search_engine best_search_engine_score[1] search_engine_score[1]_ms_run[1] search_engine_score[1]_ms_run[2] ... num_peptides_unique_ms_run[254] num_peptides_unique_ms_run[255] num_peptides_unique_ms_run[256] num_peptides_unique_ms_run[257] num_peptides_unique_ms_run[258] num_peptides_unique_ms_run[259] ambiguity_members modifications protein_coverage opt_global_cv_MS:1002217_decoy_peptide
0 A0A075B6I9 sp|A0A075B6I9|LV746_HUMAN Immunoglobulin lambd... null null null null [MS, MS:1002337, Andromeda, 1.6.8.0] 2.54172068110967 null null ... null null null null null null A0A075B6I9, P04211 null 0.137 0
1 A0A075B6K5 sp|A0A075B6K5|LV39_HUMAN Immunoglobulin lambda... null null null null [MS, MS:1002337, Andromeda, 1.6.8.0] 12.3898963082584 null null ... null null null null null null A0A075B6K5, P80748 null 0.139 0
2 A0A075B6P5 sp|A0A075B6P5|KV228_HUMAN Immunoglobulin kappa... null null null null [MS, MS:1002337, Andromeda, 1.6.8.0] 37.2781261617028 null null ... null null null null null null A0A075B6P5, A0A087WW87, P01615, P01614, A2NJV5... null 0.167 0
3 A0A0C4DH67 sp|A0A0C4DH67|KV108_HUMAN Immunoglobulin kappa... null null null null [MS, MS:1002337, Andromeda, 1.6.8.0] 2.75929244987718 null null ... null null null null null null A0A0C4DH67, A0A0C4DH69, A0A075B6S5 null 0.139 0
4 A0A0A0MRZ8 sp|A0A0A0MRZ8|KVD11_HUMAN Immunoglobulin kappa... null null null null [MS, MS:1002337, Andromeda, 1.6.8.0] 10.1196640910864 null null ... null null null null null null A0A0A0MRZ8, P04433 null 0.322 0

5 rows × 1048 columns